{ "cells": [ { "cell_type": "markdown", "metadata": { "id": "Jic0H1XJ-qrc" }, "source": [ "**Chapter 2 – End-to-end Machine Learning project**\n", "\n", "*Welcome to Machine Learning Housing Corp.! Your task is to predict median house values in Californian districts, given a number of features from these districts.*\n", "\n", "*This notebook contains sample code from https://github.com/ageron/handson-ml2.*" ] }, { "cell_type": "markdown", "metadata": { "id": "Jv_2Nq2q-qre" }, "source": [ "
\n",
" | \n",
" \n",
" | \n",
"
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "-122.23 | \n", "37.88 | \n", "41.0 | \n", "880.0 | \n", "129.0 | \n", "322.0 | \n", "126.0 | \n", "8.3252 | \n", "452600.0 | \n", "NEAR BAY | \n", "
1 | \n", "-122.22 | \n", "37.86 | \n", "21.0 | \n", "7099.0 | \n", "1106.0 | \n", "2401.0 | \n", "1138.0 | \n", "8.3014 | \n", "358500.0 | \n", "NEAR BAY | \n", "
2 | \n", "-122.24 | \n", "37.85 | \n", "52.0 | \n", "1467.0 | \n", "190.0 | \n", "496.0 | \n", "177.0 | \n", "7.2574 | \n", "352100.0 | \n", "NEAR BAY | \n", "
3 | \n", "-122.25 | \n", "37.85 | \n", "52.0 | \n", "1274.0 | \n", "235.0 | \n", "558.0 | \n", "219.0 | \n", "5.6431 | \n", "341300.0 | \n", "NEAR BAY | \n", "
4 | \n", "-122.25 | \n", "37.85 | \n", "52.0 | \n", "1627.0 | \n", "280.0 | \n", "565.0 | \n", "259.0 | \n", "3.8462 | \n", "342200.0 | \n", "NEAR BAY | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "
---|---|---|---|---|---|---|---|---|---|
count | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20433.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "20640.000000 | \n", "
mean | \n", "-119.569704 | \n", "35.631861 | \n", "28.639486 | \n", "2635.763081 | \n", "537.870553 | \n", "1425.476744 | \n", "499.539680 | \n", "3.870671 | \n", "206855.816909 | \n", "
std | \n", "2.003532 | \n", "2.135952 | \n", "12.585558 | \n", "2181.615252 | \n", "421.385070 | \n", "1132.462122 | \n", "382.329753 | \n", "1.899822 | \n", "115395.615874 | \n", "
min | \n", "-124.350000 | \n", "32.540000 | \n", "1.000000 | \n", "2.000000 | \n", "1.000000 | \n", "3.000000 | \n", "1.000000 | \n", "0.499900 | \n", "14999.000000 | \n", "
25% | \n", "-121.800000 | \n", "33.930000 | \n", "18.000000 | \n", "1447.750000 | \n", "296.000000 | \n", "787.000000 | \n", "280.000000 | \n", "2.563400 | \n", "119600.000000 | \n", "
50% | \n", "-118.490000 | \n", "34.260000 | \n", "29.000000 | \n", "2127.000000 | \n", "435.000000 | \n", "1166.000000 | \n", "409.000000 | \n", "3.534800 | \n", "179700.000000 | \n", "
75% | \n", "-118.010000 | \n", "37.710000 | \n", "37.000000 | \n", "3148.000000 | \n", "647.000000 | \n", "1725.000000 | \n", "605.000000 | \n", "4.743250 | \n", "264725.000000 | \n", "
max | \n", "-114.310000 | \n", "41.950000 | \n", "52.000000 | \n", "39320.000000 | \n", "6445.000000 | \n", "35682.000000 | \n", "6082.000000 | \n", "15.000100 | \n", "500001.000000 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|---|
20046 | \n", "-119.01 | \n", "36.06 | \n", "25.0 | \n", "1505.0 | \n", "NaN | \n", "1392.0 | \n", "359.0 | \n", "1.6812 | \n", "47700.0 | \n", "INLAND | \n", "
3024 | \n", "-119.46 | \n", "35.14 | \n", "30.0 | \n", "2943.0 | \n", "NaN | \n", "1565.0 | \n", "584.0 | \n", "2.5313 | \n", "45800.0 | \n", "INLAND | \n", "
15663 | \n", "-122.44 | \n", "37.80 | \n", "52.0 | \n", "3830.0 | \n", "NaN | \n", "1310.0 | \n", "963.0 | \n", "3.4801 | \n", "500001.0 | \n", "NEAR BAY | \n", "
20484 | \n", "-118.72 | \n", "34.28 | \n", "17.0 | \n", "3051.0 | \n", "NaN | \n", "1705.0 | \n", "495.0 | \n", "5.7376 | \n", "218600.0 | \n", "<1H OCEAN | \n", "
9814 | \n", "-121.93 | \n", "36.62 | \n", "34.0 | \n", "2351.0 | \n", "NaN | \n", "1063.0 | \n", "428.0 | \n", "3.7250 | \n", "278000.0 | \n", "NEAR OCEAN | \n", "
\n", " | Overall | \n", "Stratified | \n", "Random | \n", "Rand. %error | \n", "Strat. %error | \n", "
---|---|---|---|---|---|
1 | \n", "0.039826 | \n", "0.039729 | \n", "0.040213 | \n", "0.973236 | \n", "-0.243309 | \n", "
2 | \n", "0.318847 | \n", "0.318798 | \n", "0.324370 | \n", "1.732260 | \n", "-0.015195 | \n", "
3 | \n", "0.350581 | \n", "0.350533 | \n", "0.358527 | \n", "2.266446 | \n", "-0.013820 | \n", "
4 | \n", "0.176308 | \n", "0.176357 | \n", "0.167393 | \n", "-5.056334 | \n", "0.027480 | \n", "
5 | \n", "0.114438 | \n", "0.114583 | \n", "0.109496 | \n", "-4.318374 | \n", "0.127011 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|
4629 | \n", "-118.30 | \n", "34.07 | \n", "18.0 | \n", "3759.0 | \n", "NaN | \n", "3296.0 | \n", "1462.0 | \n", "2.2708 | \n", "<1H OCEAN | \n", "
6068 | \n", "-117.86 | \n", "34.01 | \n", "16.0 | \n", "4632.0 | \n", "NaN | \n", "3038.0 | \n", "727.0 | \n", "5.1762 | \n", "<1H OCEAN | \n", "
17923 | \n", "-121.97 | \n", "37.35 | \n", "30.0 | \n", "1955.0 | \n", "NaN | \n", "999.0 | \n", "386.0 | \n", "4.6328 | \n", "<1H OCEAN | \n", "
13656 | \n", "-117.30 | \n", "34.05 | \n", "6.0 | \n", "2155.0 | \n", "NaN | \n", "1039.0 | \n", "391.0 | \n", "1.6675 | \n", "INLAND | \n", "
19252 | \n", "-122.79 | \n", "38.48 | \n", "7.0 | \n", "6837.0 | \n", "NaN | \n", "3468.0 | \n", "1405.0 | \n", "3.1662 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|
4629 | \n", "-118.30 | \n", "34.07 | \n", "18.0 | \n", "3759.0 | \n", "3296.0 | \n", "1462.0 | \n", "2.2708 | \n", "<1H OCEAN | \n", "
6068 | \n", "-117.86 | \n", "34.01 | \n", "16.0 | \n", "4632.0 | \n", "3038.0 | \n", "727.0 | \n", "5.1762 | \n", "<1H OCEAN | \n", "
17923 | \n", "-121.97 | \n", "37.35 | \n", "30.0 | \n", "1955.0 | \n", "999.0 | \n", "386.0 | \n", "4.6328 | \n", "<1H OCEAN | \n", "
13656 | \n", "-117.30 | \n", "34.05 | \n", "6.0 | \n", "2155.0 | \n", "1039.0 | \n", "391.0 | \n", "1.6675 | \n", "INLAND | \n", "
19252 | \n", "-122.79 | \n", "38.48 | \n", "7.0 | \n", "6837.0 | \n", "3468.0 | \n", "1405.0 | \n", "3.1662 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "
---|---|---|---|---|---|---|---|---|---|
4629 | \n", "-118.30 | \n", "34.07 | \n", "18.0 | \n", "3759.0 | \n", "433.0 | \n", "3296.0 | \n", "1462.0 | \n", "2.2708 | \n", "<1H OCEAN | \n", "
6068 | \n", "-117.86 | \n", "34.01 | \n", "16.0 | \n", "4632.0 | \n", "433.0 | \n", "3038.0 | \n", "727.0 | \n", "5.1762 | \n", "<1H OCEAN | \n", "
17923 | \n", "-121.97 | \n", "37.35 | \n", "30.0 | \n", "1955.0 | \n", "433.0 | \n", "999.0 | \n", "386.0 | \n", "4.6328 | \n", "<1H OCEAN | \n", "
13656 | \n", "-117.30 | \n", "34.05 | \n", "6.0 | \n", "2155.0 | \n", "433.0 | \n", "1039.0 | \n", "391.0 | \n", "1.6675 | \n", "INLAND | \n", "
19252 | \n", "-122.79 | \n", "38.48 | \n", "7.0 | \n", "6837.0 | \n", "433.0 | \n", "3468.0 | \n", "1405.0 | \n", "3.1662 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "
---|---|---|---|---|---|---|---|---|
17606 | \n", "-121.89 | \n", "37.29 | \n", "38.0 | \n", "1568.0 | \n", "351.0 | \n", "710.0 | \n", "339.0 | \n", "2.7042 | \n", "
18632 | \n", "-121.93 | \n", "37.05 | \n", "14.0 | \n", "679.0 | \n", "108.0 | \n", "306.0 | \n", "113.0 | \n", "6.4214 | \n", "
14650 | \n", "-117.20 | \n", "32.77 | \n", "31.0 | \n", "1952.0 | \n", "471.0 | \n", "936.0 | \n", "462.0 | \n", "2.8621 | \n", "
3230 | \n", "-119.61 | \n", "36.31 | \n", "25.0 | \n", "1847.0 | \n", "371.0 | \n", "1460.0 | \n", "353.0 | \n", "1.8839 | \n", "
3555 | \n", "-118.59 | \n", "34.23 | \n", "17.0 | \n", "6592.0 | \n", "1525.0 | \n", "4459.0 | \n", "1463.0 | \n", "3.0347 | \n", "
\n", " | ocean_proximity | \n", "
---|---|
17606 | \n", "<1H OCEAN | \n", "
18632 | \n", "<1H OCEAN | \n", "
14650 | \n", "NEAR OCEAN | \n", "
3230 | \n", "INLAND | \n", "
3555 | \n", "<1H OCEAN | \n", "
19480 | \n", "INLAND | \n", "
8879 | \n", "<1H OCEAN | \n", "
13685 | \n", "INLAND | \n", "
4937 | \n", "<1H OCEAN | \n", "
4861 | \n", "<1H OCEAN | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity | \n", "rooms_per_household | \n", "population_per_household | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
17606 | \n", "-121.89 | \n", "37.29 | \n", "38.0 | \n", "1568.0 | \n", "351.0 | \n", "710.0 | \n", "339.0 | \n", "2.7042 | \n", "<1H OCEAN | \n", "4.625369 | \n", "2.094395 | \n", "
18632 | \n", "-121.93 | \n", "37.05 | \n", "14.0 | \n", "679.0 | \n", "108.0 | \n", "306.0 | \n", "113.0 | \n", "6.4214 | \n", "<1H OCEAN | \n", "6.00885 | \n", "2.707965 | \n", "
14650 | \n", "-117.2 | \n", "32.77 | \n", "31.0 | \n", "1952.0 | \n", "471.0 | \n", "936.0 | \n", "462.0 | \n", "2.8621 | \n", "NEAR OCEAN | \n", "4.225108 | \n", "2.025974 | \n", "
3230 | \n", "-119.61 | \n", "36.31 | \n", "25.0 | \n", "1847.0 | \n", "371.0 | \n", "1460.0 | \n", "353.0 | \n", "1.8839 | \n", "INLAND | \n", "5.232295 | \n", "4.135977 | \n", "
3555 | \n", "-118.59 | \n", "34.23 | \n", "17.0 | \n", "6592.0 | \n", "1525.0 | \n", "4459.0 | \n", "1463.0 | \n", "3.0347 | \n", "<1H OCEAN | \n", "4.50581 | \n", "3.047847 | \n", "
\n", " | mean_fit_time | \n", "std_fit_time | \n", "mean_score_time | \n", "std_score_time | \n", "param_max_features | \n", "param_n_estimators | \n", "param_bootstrap | \n", "params | \n", "split0_test_score | \n", "split1_test_score | \n", "split2_test_score | \n", "split3_test_score | \n", "split4_test_score | \n", "mean_test_score | \n", "std_test_score | \n", "rank_test_score | \n", "split0_train_score | \n", "split1_train_score | \n", "split2_train_score | \n", "split3_train_score | \n", "split4_train_score | \n", "mean_train_score | \n", "std_train_score | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0.077983 | \n", "0.001933 | \n", "0.004822 | \n", "0.000110 | \n", "2 | \n", "3 | \n", "NaN | \n", "{'max_features': 2, 'n_estimators': 3} | \n", "-3.837622e+09 | \n", "-4.147108e+09 | \n", "-4.196408e+09 | \n", "-3.903319e+09 | \n", "-4.184325e+09 | \n", "-4.053756e+09 | \n", "1.519591e+08 | \n", "18 | \n", "-1.064113e+09 | \n", "-1.105142e+09 | \n", "-1.116550e+09 | \n", "-1.112342e+09 | \n", "-1.129650e+09 | \n", "-1.105559e+09 | \n", "2.220402e+07 | \n", "
1 | \n", "0.250305 | \n", "0.007294 | \n", "0.013293 | \n", "0.001032 | \n", "2 | \n", "10 | \n", "NaN | \n", "{'max_features': 2, 'n_estimators': 10} | \n", "-3.047771e+09 | \n", "-3.254861e+09 | \n", "-3.130196e+09 | \n", "-2.865188e+09 | \n", "-3.173856e+09 | \n", "-3.094374e+09 | \n", "1.327062e+08 | \n", "11 | \n", "-5.927175e+08 | \n", "-5.870952e+08 | \n", "-5.776964e+08 | \n", "-5.716332e+08 | \n", "-5.802501e+08 | \n", "-5.818785e+08 | \n", "7.345821e+06 | \n", "
2 | \n", "0.740687 | \n", "0.005654 | \n", "0.035537 | \n", "0.001816 | \n", "2 | \n", "30 | \n", "NaN | \n", "{'max_features': 2, 'n_estimators': 30} | \n", "-2.689185e+09 | \n", "-3.021086e+09 | \n", "-2.948330e+09 | \n", "-2.619995e+09 | \n", "-2.970968e+09 | \n", "-2.849913e+09 | \n", "1.626875e+08 | \n", "9 | \n", "-4.381089e+08 | \n", "-4.391272e+08 | \n", "-4.371702e+08 | \n", "-4.376955e+08 | \n", "-4.452654e+08 | \n", "-4.394734e+08 | \n", "2.966320e+06 | \n", "
3 | \n", "0.123405 | \n", "0.002662 | \n", "0.004790 | \n", "0.000186 | \n", "4 | \n", "3 | \n", "NaN | \n", "{'max_features': 4, 'n_estimators': 3} | \n", "-3.730181e+09 | \n", "-3.786886e+09 | \n", "-3.734515e+09 | \n", "-3.418747e+09 | \n", "-3.913907e+09 | \n", "-3.716847e+09 | \n", "1.631510e+08 | \n", "16 | \n", "-9.865163e+08 | \n", "-1.012565e+09 | \n", "-9.169425e+08 | \n", "-1.037400e+09 | \n", "-9.707739e+08 | \n", "-9.848396e+08 | \n", "4.084607e+07 | \n", "
4 | \n", "0.406428 | \n", "0.003815 | \n", "0.012748 | \n", "0.000478 | \n", "4 | \n", "10 | \n", "NaN | \n", "{'max_features': 4, 'n_estimators': 10} | \n", "-2.666283e+09 | \n", "-2.784511e+09 | \n", "-2.892276e+09 | \n", "-2.616813e+09 | \n", "-2.948207e+09 | \n", "-2.781618e+09 | \n", "1.268607e+08 | \n", "8 | \n", "-5.097115e+08 | \n", "-5.162820e+08 | \n", "-4.962893e+08 | \n", "-5.436192e+08 | \n", "-5.160297e+08 | \n", "-5.163863e+08 | \n", "1.542862e+07 | \n", "
5 | \n", "1.200080 | \n", "0.003086 | \n", "0.034590 | \n", "0.000606 | \n", "4 | \n", "30 | \n", "NaN | \n", "{'max_features': 4, 'n_estimators': 30} | \n", "-2.387153e+09 | \n", "-2.588448e+09 | \n", "-2.666426e+09 | \n", "-2.398071e+09 | \n", "-2.649316e+09 | \n", "-2.537883e+09 | \n", "1.214614e+08 | \n", "3 | \n", "-3.838835e+08 | \n", "-3.880268e+08 | \n", "-3.790867e+08 | \n", "-4.040957e+08 | \n", "-3.845520e+08 | \n", "-3.879289e+08 | \n", "8.571233e+06 | \n", "
6 | \n", "0.165869 | \n", "0.006028 | \n", "0.004667 | \n", "0.000078 | \n", "6 | \n", "3 | \n", "NaN | \n", "{'max_features': 6, 'n_estimators': 3} | \n", "-3.119657e+09 | \n", "-3.586319e+09 | \n", "-3.592772e+09 | \n", "-3.328934e+09 | \n", "-3.579607e+09 | \n", "-3.441458e+09 | \n", "1.893056e+08 | \n", "14 | \n", "-9.245343e+08 | \n", "-8.886939e+08 | \n", "-9.353135e+08 | \n", "-9.009801e+08 | \n", "-8.624664e+08 | \n", "-9.023976e+08 | \n", "2.591445e+07 | \n", "
7 | \n", "0.548989 | \n", "0.004696 | \n", "0.012454 | \n", "0.000123 | \n", "6 | \n", "10 | \n", "NaN | \n", "{'max_features': 6, 'n_estimators': 10} | \n", "-2.549663e+09 | \n", "-2.782039e+09 | \n", "-2.762720e+09 | \n", "-2.521134e+09 | \n", "-2.907667e+09 | \n", "-2.704645e+09 | \n", "1.471569e+08 | \n", "6 | \n", "-4.980344e+08 | \n", "-5.045869e+08 | \n", "-4.994664e+08 | \n", "-4.990325e+08 | \n", "-5.055542e+08 | \n", "-5.013349e+08 | \n", "3.100456e+06 | \n", "
8 | \n", "1.668515 | \n", "0.013649 | \n", "0.036802 | \n", "0.004247 | \n", "6 | \n", "30 | \n", "NaN | \n", "{'max_features': 6, 'n_estimators': 30} | \n", "-2.370010e+09 | \n", "-2.583638e+09 | \n", "-2.607703e+09 | \n", "-2.350953e+09 | \n", "-2.661059e+09 | \n", "-2.514673e+09 | \n", "1.285080e+08 | \n", "2 | \n", "-3.838538e+08 | \n", "-3.804711e+08 | \n", "-3.805218e+08 | \n", "-3.856095e+08 | \n", "-3.901917e+08 | \n", "-3.841296e+08 | \n", "3.617057e+06 | \n", "
9 | \n", "0.208969 | \n", "0.001108 | \n", "0.005141 | \n", "0.000918 | \n", "8 | \n", "3 | \n", "NaN | \n", "{'max_features': 8, 'n_estimators': 3} | \n", "-3.353504e+09 | \n", "-3.348552e+09 | \n", "-3.402843e+09 | \n", "-3.129307e+09 | \n", "-3.510047e+09 | \n", "-3.348850e+09 | \n", "1.241939e+08 | \n", "13 | \n", "-9.228123e+08 | \n", "-8.553031e+08 | \n", "-8.603321e+08 | \n", "-8.881964e+08 | \n", "-9.151287e+08 | \n", "-8.883545e+08 | \n", "2.750227e+07 | \n", "
10 | \n", "0.713209 | \n", "0.010426 | \n", "0.012501 | \n", "0.000150 | \n", "8 | \n", "10 | \n", "NaN | \n", "{'max_features': 8, 'n_estimators': 10} | \n", "-2.571970e+09 | \n", "-2.718994e+09 | \n", "-2.842317e+09 | \n", "-2.460258e+09 | \n", "-2.776666e+09 | \n", "-2.674041e+09 | \n", "1.392777e+08 | \n", "5 | \n", "-4.932416e+08 | \n", "-4.815238e+08 | \n", "-4.730979e+08 | \n", "-5.155367e+08 | \n", "-4.985555e+08 | \n", "-4.923911e+08 | \n", "1.459294e+07 | \n", "
11 | \n", "2.139435 | \n", "0.016860 | \n", "0.035008 | \n", "0.000378 | \n", "8 | \n", "30 | \n", "NaN | \n", "{'max_features': 8, 'n_estimators': 30} | \n", "-2.357390e+09 | \n", "-2.546640e+09 | \n", "-2.591972e+09 | \n", "-2.318617e+09 | \n", "-2.527022e+09 | \n", "-2.468328e+09 | \n", "1.091662e+08 | \n", "1 | \n", "-3.841658e+08 | \n", "-3.744500e+08 | \n", "-3.773239e+08 | \n", "-3.882250e+08 | \n", "-3.810005e+08 | \n", "-3.810330e+08 | \n", "4.871017e+06 | \n", "
12 | \n", "0.120023 | \n", "0.004007 | \n", "0.005649 | \n", "0.000089 | \n", "2 | \n", "3 | \n", "False | \n", "{'bootstrap': False, 'max_features': 2, 'n_est... | \n", "-3.785816e+09 | \n", "-4.166012e+09 | \n", "-4.061751e+09 | \n", "-3.675704e+09 | \n", "-4.089667e+09 | \n", "-3.955790e+09 | \n", "1.900964e+08 | \n", "17 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "0.000000e+00 | \n", "0.000000e+00 | \n", "
13 | \n", "0.389255 | \n", "0.002722 | \n", "0.015147 | \n", "0.000292 | \n", "2 | \n", "10 | \n", "False | \n", "{'bootstrap': False, 'max_features': 2, 'n_est... | \n", "-2.810721e+09 | \n", "-3.107789e+09 | \n", "-3.131187e+09 | \n", "-2.788537e+09 | \n", "-3.099347e+09 | \n", "-2.987516e+09 | \n", "1.539234e+08 | \n", "10 | \n", "-6.056477e-02 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-2.967449e+00 | \n", "-6.056027e-01 | \n", "1.181156e+00 | \n", "
14 | \n", "0.155958 | \n", "0.002980 | \n", "0.005564 | \n", "0.000132 | \n", "3 | \n", "3 | \n", "False | \n", "{'bootstrap': False, 'max_features': 3, 'n_est... | \n", "-3.618324e+09 | \n", "-3.441527e+09 | \n", "-3.554815e+09 | \n", "-3.619116e+09 | \n", "-3.449864e+09 | \n", "-3.536729e+09 | \n", "7.795057e+07 | \n", "15 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-6.072840e+01 | \n", "-1.214568e+01 | \n", "2.429136e+01 | \n", "
15 | \n", "0.511048 | \n", "0.003302 | \n", "0.015071 | \n", "0.000156 | \n", "3 | \n", "10 | \n", "False | \n", "{'bootstrap': False, 'max_features': 3, 'n_est... | \n", "-2.757999e+09 | \n", "-2.851737e+09 | \n", "-2.830927e+09 | \n", "-2.672765e+09 | \n", "-2.786190e+09 | \n", "-2.779924e+09 | \n", "6.286720e+07 | \n", "7 | \n", "-2.089484e+01 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-5.465556e+00 | \n", "-5.272080e+00 | \n", "8.093117e+00 | \n", "
16 | \n", "0.194758 | \n", "0.005894 | \n", "0.005798 | \n", "0.000415 | \n", "4 | \n", "3 | \n", "False | \n", "{'bootstrap': False, 'max_features': 4, 'n_est... | \n", "-3.134040e+09 | \n", "-3.559375e+09 | \n", "-3.440422e+09 | \n", "-3.053647e+09 | \n", "-3.338344e+09 | \n", "-3.305166e+09 | \n", "1.879165e+08 | \n", "12 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "0.000000e+00 | \n", "0.000000e+00 | \n", "
17 | \n", "0.641786 | \n", "0.006101 | \n", "0.014823 | \n", "0.000179 | \n", "4 | \n", "10 | \n", "False | \n", "{'bootstrap': False, 'max_features': 4, 'n_est... | \n", "-2.525578e+09 | \n", "-2.710011e+09 | \n", "-2.609100e+09 | \n", "-2.439607e+09 | \n", "-2.725548e+09 | \n", "-2.601969e+09 | \n", "1.088048e+08 | \n", "4 | \n", "-0.000000e+00 | \n", "-1.514119e-02 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-0.000000e+00 | \n", "-3.028238e-03 | \n", "6.056477e-03 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "median_house_value | \n", "ocean_proximity | \n", "income_cat | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "-122.23 | \n", "37.88 | \n", "41.0 | \n", "880.0 | \n", "129.0 | \n", "322.0 | \n", "126.0 | \n", "8.3252 | \n", "452600.0 | \n", "NEAR BAY | \n", "5 | \n", "
1 | \n", "-122.22 | \n", "37.86 | \n", "21.0 | \n", "7099.0 | \n", "1106.0 | \n", "2401.0 | \n", "1138.0 | \n", "8.3014 | \n", "358500.0 | \n", "NEAR BAY | \n", "5 | \n", "
2 | \n", "-122.24 | \n", "37.85 | \n", "52.0 | \n", "1467.0 | \n", "190.0 | \n", "496.0 | \n", "177.0 | \n", "7.2574 | \n", "352100.0 | \n", "NEAR BAY | \n", "5 | \n", "
3 | \n", "-122.25 | \n", "37.85 | \n", "52.0 | \n", "1274.0 | \n", "235.0 | \n", "558.0 | \n", "219.0 | \n", "5.6431 | \n", "341300.0 | \n", "NEAR BAY | \n", "4 | \n", "
4 | \n", "-122.25 | \n", "37.85 | \n", "52.0 | \n", "1627.0 | \n", "280.0 | \n", "565.0 | \n", "259.0 | \n", "3.8462 | \n", "342200.0 | \n", "NEAR BAY | \n", "3 | \n", "
\n", " | Description | \n", "Value | \n", "
---|---|---|
0 | \n", "session_id | \n", "123 | \n", "
1 | \n", "Target | \n", "median_house_value | \n", "
2 | \n", "Original Data | \n", "(20640, 11) | \n", "
3 | \n", "Missing Values | \n", "True | \n", "
4 | \n", "Numeric Features | \n", "8 | \n", "
5 | \n", "Categorical Features | \n", "2 | \n", "
6 | \n", "Ordinal Features | \n", "False | \n", "
7 | \n", "High Cardinality Features | \n", "False | \n", "
8 | \n", "High Cardinality Method | \n", "None | \n", "
9 | \n", "Transformed Train Set | \n", "(16512, 18) | \n", "
10 | \n", "Transformed Test Set | \n", "(4128, 18) | \n", "
11 | \n", "Shuffle Train-Test | \n", "True | \n", "
12 | \n", "Stratify Train-Test | \n", "['income_cat'] | \n", "
13 | \n", "Fold Generator | \n", "KFold | \n", "
14 | \n", "Fold Number | \n", "10 | \n", "
15 | \n", "CPU Jobs | \n", "-1 | \n", "
16 | \n", "Use GPU | \n", "False | \n", "
17 | \n", "Log Experiment | \n", "True | \n", "
18 | \n", "Experiment Name | \n", "ca_housing | \n", "
19 | \n", "USI | \n", "f856 | \n", "
20 | \n", "Imputation Type | \n", "simple | \n", "
21 | \n", "Iterative Imputation Iteration | \n", "None | \n", "
22 | \n", "Numeric Imputer | \n", "median | \n", "
23 | \n", "Iterative Imputation Numeric Model | \n", "None | \n", "
24 | \n", "Categorical Imputer | \n", "constant | \n", "
25 | \n", "Iterative Imputation Categorical Model | \n", "None | \n", "
26 | \n", "Unknown Categoricals Handling | \n", "least_frequent | \n", "
27 | \n", "Normalize | \n", "True | \n", "
28 | \n", "Normalize Method | \n", "zscore | \n", "
29 | \n", "Transformation | \n", "False | \n", "
30 | \n", "Transformation Method | \n", "None | \n", "
31 | \n", "PCA | \n", "False | \n", "
32 | \n", "PCA Method | \n", "None | \n", "
33 | \n", "PCA Components | \n", "None | \n", "
34 | \n", "Ignore Low Variance | \n", "False | \n", "
35 | \n", "Combine Rare Levels | \n", "False | \n", "
36 | \n", "Rare Level Threshold | \n", "None | \n", "
37 | \n", "Numeric Binning | \n", "False | \n", "
38 | \n", "Remove Outliers | \n", "False | \n", "
39 | \n", "Outliers Threshold | \n", "None | \n", "
40 | \n", "Remove Multicollinearity | \n", "False | \n", "
41 | \n", "Multicollinearity Threshold | \n", "None | \n", "
42 | \n", "Remove Perfect Collinearity | \n", "True | \n", "
43 | \n", "Clustering | \n", "False | \n", "
44 | \n", "Clustering Iteration | \n", "None | \n", "
45 | \n", "Polynomial Features | \n", "False | \n", "
46 | \n", "Polynomial Degree | \n", "None | \n", "
47 | \n", "Trignometry Features | \n", "False | \n", "
48 | \n", "Polynomial Threshold | \n", "None | \n", "
49 | \n", "Group Features | \n", "False | \n", "
50 | \n", "Feature Selection | \n", "False | \n", "
51 | \n", "Feature Selection Method | \n", "classic | \n", "
52 | \n", "Features Selection Threshold | \n", "None | \n", "
53 | \n", "Feature Interaction | \n", "False | \n", "
54 | \n", "Feature Ratio | \n", "False | \n", "
55 | \n", "Interaction Threshold | \n", "None | \n", "
56 | \n", "Transform Target | \n", "False | \n", "
57 | \n", "Transform Target Method | \n", "box-cox | \n", "
\n", " | Model | \n", "MAE | \n", "MSE | \n", "RMSE | \n", "R2 | \n", "RMSLE | \n", "MAPE | \n", "TT (Sec) | \n", "
---|---|---|---|---|---|---|---|---|
catboost | \n", "CatBoost Regressor | \n", "30581.5747 | \n", "2.127545e+09 | \n", "46106.7110 | \n", "0.8401 | \n", "0.2292 | \n", "0.1713 | \n", "6.092 | \n", "
lightgbm | \n", "Light Gradient Boosting Machine | \n", "32080.4953 | \n", "2.288939e+09 | \n", "47825.1154 | \n", "0.8280 | \n", "0.2368 | \n", "0.1803 | \n", "0.380 | \n", "
xgboost | \n", "Extreme Gradient Boosting | \n", "32319.8227 | \n", "2.360399e+09 | \n", "48565.5055 | \n", "0.8226 | \n", "0.2402 | \n", "0.1802 | \n", "5.276 | \n", "
rf | \n", "Random Forest Regressor | \n", "32380.6304 | \n", "2.443352e+09 | \n", "49413.7604 | \n", "0.8163 | \n", "0.2402 | \n", "0.1813 | \n", "10.390 | \n", "
et | \n", "Extra Trees Regressor | \n", "35610.3678 | \n", "2.838177e+09 | \n", "53259.6912 | \n", "0.7867 | \n", "0.2571 | \n", "0.2000 | \n", "3.562 | \n", "
gbr | \n", "Gradient Boosting Regressor | \n", "38546.1402 | \n", "3.081754e+09 | \n", "55499.7261 | \n", "0.7684 | \n", "0.2724 | \n", "0.2172 | \n", "2.442 | \n", "
knn | \n", "K Neighbors Regressor | \n", "42437.8477 | \n", "3.907490e+09 | \n", "62500.9859 | \n", "0.7063 | \n", "0.2950 | \n", "0.2307 | \n", "0.312 | \n", "
ridge | \n", "Ridge Regression | \n", "49215.7203 | \n", "4.616907e+09 | \n", "67944.2328 | \n", "0.6531 | \n", "0.3706 | \n", "0.2857 | \n", "0.056 | \n", "
lr | \n", "Linear Regression | \n", "49213.1812 | \n", "4.617130e+09 | \n", "67946.0641 | \n", "0.6531 | \n", "0.3706 | \n", "0.2857 | \n", "0.896 | \n", "
lasso | \n", "Lasso Regression | \n", "49213.9734 | \n", "4.617133e+09 | \n", "67946.0688 | \n", "0.6531 | \n", "0.3706 | \n", "0.2857 | \n", "0.086 | \n", "
llar | \n", "Lasso Least Angle Regression | \n", "49199.5742 | \n", "4.617416e+09 | \n", "67948.4755 | \n", "0.6531 | \n", "0.3648 | \n", "0.2850 | \n", "0.054 | \n", "
br | \n", "Bayesian Ridge | \n", "49219.0580 | \n", "4.618043e+09 | \n", "67952.4290 | \n", "0.6530 | \n", "0.3706 | \n", "0.2857 | \n", "0.062 | \n", "
dt | \n", "Decision Tree Regressor | \n", "43745.8735 | \n", "4.671816e+09 | \n", "68330.6820 | \n", "0.6489 | \n", "0.3266 | \n", "0.2419 | \n", "0.248 | \n", "
huber | \n", "Huber Regressor | \n", "47852.7348 | \n", "4.747789e+09 | \n", "68899.4894 | \n", "0.6433 | \n", "0.3588 | \n", "0.2607 | \n", "0.494 | \n", "
par | \n", "Passive Aggressive Regressor | \n", "47800.1742 | \n", "4.854553e+09 | \n", "69669.4181 | \n", "0.6353 | \n", "0.3531 | \n", "0.2539 | \n", "0.930 | \n", "
lar | \n", "Least Angle Regression | \n", "51104.6761 | \n", "4.987058e+09 | \n", "70467.8720 | \n", "0.6246 | \n", "0.3926 | \n", "0.2960 | \n", "0.058 | \n", "
en | \n", "Elastic Net | \n", "58414.0102 | \n", "5.969090e+09 | \n", "77253.8500 | \n", "0.5516 | \n", "0.3961 | \n", "0.3676 | \n", "0.064 | \n", "
omp | \n", "Orthogonal Matching Pursuit | \n", "62498.9386 | \n", "6.998824e+09 | \n", "83650.4437 | \n", "0.4742 | \n", "0.4274 | \n", "0.3862 | \n", "0.056 | \n", "
ada | \n", "AdaBoost Regressor | \n", "73019.0208 | \n", "7.434027e+09 | \n", "86129.4616 | \n", "0.4423 | \n", "0.4575 | \n", "0.4953 | \n", "1.124 | \n", "
dummy | \n", "Dummy Regressor | \n", "91134.4797 | \n", "1.331817e+10 | \n", "115399.7062 | \n", "-0.0004 | \n", "0.5902 | \n", "0.6218 | \n", "0.038 | \n", "
\n", " | MAE | \n", "MSE | \n", "RMSE | \n", "R2 | \n", "RMSLE | \n", "MAPE | \n", "
---|---|---|---|---|---|---|
0 | \n", "32293.8649 | \n", "2.361319e+09 | \n", "48593.4073 | \n", "0.8235 | \n", "0.2471 | \n", "0.1904 | \n", "
1 | \n", "31843.9485 | \n", "2.250754e+09 | \n", "47442.1102 | \n", "0.8383 | \n", "0.2388 | \n", "0.1800 | \n", "
2 | \n", "31348.3474 | \n", "2.181586e+09 | \n", "46707.4544 | \n", "0.8319 | \n", "0.2336 | \n", "0.1756 | \n", "
3 | \n", "31826.7910 | \n", "2.110376e+09 | \n", "45938.8300 | \n", "0.8486 | \n", "0.2205 | \n", "0.1700 | \n", "
4 | \n", "31266.5081 | \n", "2.022385e+09 | \n", "44970.9387 | \n", "0.8453 | \n", "0.2255 | \n", "0.1753 | \n", "
5 | \n", "32285.9929 | \n", "2.347666e+09 | \n", "48452.7200 | \n", "0.8280 | \n", "0.2389 | \n", "0.1799 | \n", "
6 | \n", "32917.5026 | \n", "2.481263e+09 | \n", "49812.2748 | \n", "0.8023 | \n", "0.2478 | \n", "0.1900 | \n", "
7 | \n", "32016.6061 | \n", "2.443503e+09 | \n", "49431.8047 | \n", "0.8212 | \n", "0.2366 | \n", "0.1761 | \n", "
8 | \n", "32510.1652 | \n", "2.372810e+09 | \n", "48711.4953 | \n", "0.8124 | \n", "0.2396 | \n", "0.1825 | \n", "
9 | \n", "31974.8665 | \n", "2.182846e+09 | \n", "46720.9401 | \n", "0.8361 | \n", "0.2368 | \n", "0.1820 | \n", "
Mean | \n", "32028.4593 | \n", "2.275451e+09 | \n", "47678.1976 | \n", "0.8288 | \n", "0.2365 | \n", "0.1802 | \n", "
SD | \n", "477.4988 | \n", "1.421110e+08 | \n", "1496.7863 | \n", "0.0137 | \n", "0.0081 | \n", "0.0061 | \n", "
\n", " | MAE | \n", "MSE | \n", "RMSE | \n", "R2 | \n", "RMSLE | \n", "MAPE | \n", "
---|---|---|---|---|---|---|
0 | \n", "30749.6800 | \n", "2.208185e+09 | \n", "46991.3237 | \n", "0.8350 | \n", "0.2414 | \n", "0.1793 | \n", "
1 | \n", "31013.1597 | \n", "2.199479e+09 | \n", "46898.6031 | \n", "0.8420 | \n", "0.2391 | \n", "0.1744 | \n", "
2 | \n", "30048.7226 | \n", "2.010211e+09 | \n", "44835.3716 | \n", "0.8451 | \n", "0.2278 | \n", "0.1662 | \n", "
3 | \n", "29760.2153 | \n", "1.906170e+09 | \n", "43659.7098 | \n", "0.8632 | \n", "0.2192 | \n", "0.1596 | \n", "
4 | \n", "29536.5488 | \n", "1.821557e+09 | \n", "42679.7016 | \n", "0.8607 | \n", "0.2190 | \n", "0.1662 | \n", "
5 | \n", "31421.1801 | \n", "2.227955e+09 | \n", "47201.2160 | \n", "0.8367 | \n", "0.2352 | \n", "0.1751 | \n", "
6 | \n", "31475.3666 | \n", "2.331154e+09 | \n", "48282.0287 | \n", "0.8142 | \n", "0.2417 | \n", "0.1786 | \n", "
7 | \n", "31164.0971 | \n", "2.321773e+09 | \n", "48184.7804 | \n", "0.8301 | \n", "0.2357 | \n", "0.1724 | \n", "
8 | \n", "31911.1972 | \n", "2.285065e+09 | \n", "47802.3519 | \n", "0.8193 | \n", "0.2416 | \n", "0.1781 | \n", "
9 | \n", "31162.4877 | \n", "2.108047e+09 | \n", "45913.4701 | \n", "0.8417 | \n", "0.2320 | \n", "0.1748 | \n", "
Mean | \n", "30824.2655 | \n", "2.141959e+09 | \n", "46244.8557 | \n", "0.8388 | \n", "0.2333 | \n", "0.1725 | \n", "
SD | \n", "749.9779 | \n", "1.674689e+08 | \n", "1836.5230 | \n", "0.0149 | \n", "0.0083 | \n", "0.0061 | \n", "
\n", " | Model | \n", "MAE | \n", "MSE | \n", "RMSE | \n", "R2 | \n", "RMSLE | \n", "MAPE | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "Light Gradient Boosting Machine | \n", "30322.3775 | \n", "2.143047e+09 | \n", "46293.0577 | \n", "0.839 | \n", "0.2286 | \n", "0.1676 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity_INLAND | \n", "ocean_proximity_ISLAND | \n", "ocean_proximity_NEAR BAY | \n", "ocean_proximity_NEAR OCEAN | \n", "ocean_proximity__1H OCEAN | \n", "income_cat_1 | \n", "income_cat_2 | \n", "income_cat_3 | \n", "income_cat_4 | \n", "income_cat_5 | \n", "median_house_value | \n", "Label | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0.763088 | \n", "-0.843765 | \n", "-0.603827 | \n", "1.022574 | \n", "0.272975 | \n", "0.754521 | \n", "0.399176 | \n", "1.625053 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "329700.0 | \n", "352962.868246 | \n", "
1 | \n", "0.295082 | \n", "-0.115727 | \n", "1.143888 | \n", "-0.188764 | \n", "-0.345319 | \n", "-0.467342 | \n", "-0.327754 | \n", "0.076504 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "90400.0 | \n", "121376.713808 | \n", "
2 | \n", "-0.944645 | \n", "1.359017 | \n", "1.858862 | \n", "-0.830114 | \n", "-0.762254 | \n", "-0.956957 | \n", "-0.828816 | \n", "-0.533359 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "125000.0 | \n", "110374.026417 | \n", "
3 | \n", "0.563938 | \n", "-0.680424 | \n", "-1.398243 | \n", "-0.073312 | \n", "0.858105 | \n", "0.903232 | \n", "0.921007 | \n", "-0.861554 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "181300.0 | \n", "189637.026738 | \n", "
4 | \n", "1.997834 | \n", "-1.310456 | \n", "0.031705 | \n", "-0.651481 | \n", "-0.560893 | \n", "-0.542132 | \n", "-0.551025 | \n", "-1.004427 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "61100.0 | \n", "58507.770016 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
4123 | \n", "-1.447502 | \n", "0.994997 | \n", "1.382213 | \n", "0.301680 | \n", "0.602259 | \n", "0.309258 | \n", "0.718505 | \n", "-0.135740 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "352200.0 | \n", "382938.152134 | \n", "
4124 | \n", "0.917433 | \n", "-0.736426 | \n", "1.064446 | \n", "-0.061948 | \n", "0.036081 | \n", "0.106629 | \n", "0.022730 | \n", "-0.441770 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "135700.0 | \n", "131752.359849 | \n", "
4125 | \n", "-1.337968 | \n", "0.850324 | \n", "1.223329 | \n", "0.173501 | \n", "-0.153435 | \n", "-0.167312 | \n", "-0.060348 | \n", "1.480141 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "495900.0 | \n", "454350.082800 | \n", "
4126 | \n", "-0.720596 | \n", "0.948328 | \n", "-0.127178 | \n", "-0.311034 | \n", "-0.499301 | \n", "-0.368202 | \n", "-0.501698 | \n", "-0.046399 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "110500.0 | \n", "135116.934250 | \n", "
4127 | \n", "0.703344 | \n", "-0.811097 | \n", "1.064446 | \n", "-0.811023 | \n", "-0.878332 | \n", "-0.590833 | \n", "-0.792470 | \n", "-0.038923 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "145800.0 | \n", "126458.427121 | \n", "
4128 rows × 20 columns
\n", "\n", " | Model | \n", "MAE | \n", "MSE | \n", "RMSE | \n", "R2 | \n", "RMSLE | \n", "MAPE | \n", "
---|---|---|---|---|---|---|---|
0 | \n", "Light Gradient Boosting Machine | \n", "15646.0204 | \n", "5.287845e+08 | \n", "22995.315 | \n", "0.9603 | \n", "0.125 | \n", "0.0894 | \n", "
\n", " | longitude | \n", "latitude | \n", "housing_median_age | \n", "total_rooms | \n", "total_bedrooms | \n", "population | \n", "households | \n", "median_income | \n", "ocean_proximity_INLAND | \n", "ocean_proximity_ISLAND | \n", "ocean_proximity_NEAR BAY | \n", "ocean_proximity_NEAR OCEAN | \n", "ocean_proximity__1H OCEAN | \n", "income_cat_1 | \n", "income_cat_2 | \n", "income_cat_3 | \n", "income_cat_4 | \n", "income_cat_5 | \n", "median_house_value | \n", "Label | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0.763088 | \n", "-0.843765 | \n", "-0.603827 | \n", "1.022574 | \n", "0.272975 | \n", "0.754521 | \n", "0.399176 | \n", "1.625053 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "329700.0 | \n", "342728.901139 | \n", "
1 | \n", "0.295082 | \n", "-0.115727 | \n", "1.143888 | \n", "-0.188764 | \n", "-0.345319 | \n", "-0.467342 | \n", "-0.327754 | \n", "0.076504 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "90400.0 | \n", "93738.667987 | \n", "
2 | \n", "-0.944645 | \n", "1.359017 | \n", "1.858862 | \n", "-0.830114 | \n", "-0.762254 | \n", "-0.956957 | \n", "-0.828816 | \n", "-0.533359 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "125000.0 | \n", "119828.621400 | \n", "
3 | \n", "0.563938 | \n", "-0.680424 | \n", "-1.398243 | \n", "-0.073312 | \n", "0.858105 | \n", "0.903232 | \n", "0.921007 | \n", "-0.861554 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "181300.0 | \n", "182700.035854 | \n", "
4 | \n", "1.997834 | \n", "-1.310456 | \n", "0.031705 | \n", "-0.651481 | \n", "-0.560893 | \n", "-0.542132 | \n", "-0.551025 | \n", "-1.004427 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "61100.0 | \n", "51104.290583 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
4123 | \n", "-1.447502 | \n", "0.994997 | \n", "1.382213 | \n", "0.301680 | \n", "0.602259 | \n", "0.309258 | \n", "0.718505 | \n", "-0.135740 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "352200.0 | \n", "370818.956642 | \n", "
4124 | \n", "0.917433 | \n", "-0.736426 | \n", "1.064446 | \n", "-0.061948 | \n", "0.036081 | \n", "0.106629 | \n", "0.022730 | \n", "-0.441770 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "135700.0 | \n", "133249.086305 | \n", "
4125 | \n", "-1.337968 | \n", "0.850324 | \n", "1.223329 | \n", "0.173501 | \n", "-0.153435 | \n", "-0.167312 | \n", "-0.060348 | \n", "1.480141 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "495900.0 | \n", "486451.087129 | \n", "
4126 | \n", "-0.720596 | \n", "0.948328 | \n", "-0.127178 | \n", "-0.311034 | \n", "-0.499301 | \n", "-0.368202 | \n", "-0.501698 | \n", "-0.046399 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "110500.0 | \n", "132233.433352 | \n", "
4127 | \n", "0.703344 | \n", "-0.811097 | \n", "1.064446 | \n", "-0.811023 | \n", "-0.878332 | \n", "-0.590833 | \n", "-0.792470 | \n", "-0.038923 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "145800.0 | \n", "139946.427235 | \n", "
4128 rows × 20 columns
\n", "